1   package org.apache.lucene.index;
2   
3   /*
4    * Licensed to the Apache Software Foundation (ASF) under one or more
5    * contributor license agreements.  See the NOTICE file distributed with
6    * this work for additional information regarding copyright ownership.
7    * The ASF licenses this file to You under the Apache License, Version 2.0
8    * (the "License"); you may not use this file except in compliance with
9    * the License.  You may obtain a copy of the License at
10   *
11   *     http://www.apache.org/licenses/LICENSE-2.0
12   *
13   * Unless required by applicable law or agreed to in writing, software
14   * distributed under the License is distributed on an "AS IS" BASIS,
15   * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
16   * See the License for the specific language governing permissions and
17   * limitations under the License.
18   */
19  
20  import org.apache.lucene.util.Version;
21  
22  import java.io.IOException;
23  import java.util.ArrayList;
24  import java.util.List;
25  import java.util.Map;
26  import java.util.HashMap;
27  
28  /** This {@link MergePolicy} is used for upgrading all existing segments of
29    * an index when calling {@link IndexWriter#forceMerge(int)}.
30    * All other methods delegate to the base {@code MergePolicy} given to the constructor.
31    * This allows for an as-cheap-as possible upgrade of an older index by only upgrading segments that
32    * are created by previous Lucene versions. forceMerge does no longer really merge;
33    * it is just used to "forceMerge" older segment versions away.
34    * <p>In general one would use {@link IndexUpgrader}, but for a fully customizeable upgrade,
35    * you can use this like any other {@code MergePolicy} and call {@link IndexWriter#forceMerge(int)}:
36    * <pre class="prettyprint lang-java">
37    *  IndexWriterConfig iwc = new IndexWriterConfig(Version.LUCENE_XX, new KeywordAnalyzer());
38    *  iwc.setMergePolicy(new UpgradeIndexMergePolicy(iwc.getMergePolicy()));
39    *  IndexWriter w = new IndexWriter(dir, iwc);
40    *  w.forceMerge(1);
41    *  w.close();
42    * </pre>
43    * <p><b>Warning:</b> This merge policy may reorder documents if the index was partially
44    * upgraded before calling forceMerge (e.g., documents were added). If your application relies
45    * on &quot;monotonicity&quot; of doc IDs (which means that the order in which the documents
46    * were added to the index is preserved), do a forceMerge(1) instead. Please note, the
47    * delegate {@code MergePolicy} may also reorder documents.
48    * @lucene.experimental
49    * @see IndexUpgrader
50    */
51  public class UpgradeIndexMergePolicy extends MergePolicy {
52  
53    /** Wrapped {@link MergePolicy}. */
54    protected final MergePolicy base;
55  
56    /** Wrap the given {@link MergePolicy} and intercept forceMerge requests to
57     * only upgrade segments written with previous Lucene versions. */
58    public UpgradeIndexMergePolicy(MergePolicy base) {
59      this.base = base;
60    }
61    
62    /** Returns if the given segment should be upgraded. The default implementation
63     * will return {@code !Version.LATEST.equals(si.getVersion())},
64     * so all segments created with a different version number than this Lucene version will
65     * get upgraded.
66     */
67    protected boolean shouldUpgradeSegment(SegmentCommitInfo si) {
68      return !Version.LATEST.equals(si.info.getVersion());
69    }
70  
71    @Override
72    public MergeSpecification findMerges(MergeTrigger mergeTrigger, SegmentInfos segmentInfos, IndexWriter writer) throws IOException {
73      return base.findMerges(null, segmentInfos, writer);
74    }
75    
76    @Override
77    public MergeSpecification findForcedMerges(SegmentInfos segmentInfos, int maxSegmentCount, Map<SegmentCommitInfo,Boolean> segmentsToMerge, IndexWriter writer) throws IOException {
78      // first find all old segments
79      final Map<SegmentCommitInfo,Boolean> oldSegments = new HashMap<>();
80      for (final SegmentCommitInfo si : segmentInfos) {
81        final Boolean v = segmentsToMerge.get(si);
82        if (v != null && shouldUpgradeSegment(si)) {
83          oldSegments.put(si, v);
84        }
85      }
86      
87      if (verbose(writer)) {
88        message("findForcedMerges: segmentsToUpgrade=" + oldSegments, writer);
89      }
90        
91      if (oldSegments.isEmpty())
92        return null;
93  
94      MergeSpecification spec = base.findForcedMerges(segmentInfos, maxSegmentCount, oldSegments, writer);
95      
96      if (spec != null) {
97        // remove all segments that are in merge specification from oldSegments,
98        // the resulting set contains all segments that are left over
99        // and will be merged to one additional segment:
100       for (final OneMerge om : spec.merges) {
101         oldSegments.keySet().removeAll(om.segments);
102       }
103     }
104 
105     if (!oldSegments.isEmpty()) {
106       if (verbose(writer)) {
107         message("findForcedMerges: " +  base.getClass().getSimpleName() +
108         " does not want to merge all old segments, merge remaining ones into new segment: " + oldSegments, writer);
109       }
110       final List<SegmentCommitInfo> newInfos = new ArrayList<>();
111       for (final SegmentCommitInfo si : segmentInfos) {
112         if (oldSegments.containsKey(si)) {
113           newInfos.add(si);
114         }
115       }
116       // add the final merge
117       if (spec == null) {
118         spec = new MergeSpecification();
119       }
120       spec.add(new OneMerge(newInfos));
121     }
122 
123     return spec;
124   }
125   
126   @Override
127   public MergeSpecification findForcedDeletesMerges(SegmentInfos segmentInfos, IndexWriter writer) throws IOException {
128     return base.findForcedDeletesMerges(segmentInfos, writer);
129   }
130   
131   @Override
132   public boolean useCompoundFile(SegmentInfos segments, SegmentCommitInfo newSegment, IndexWriter writer) throws IOException {
133     return base.useCompoundFile(segments, newSegment, writer);
134   }
135   
136   @Override
137   public String toString() {
138     return "[" + getClass().getSimpleName() + "->" + base + "]";
139   }
140   
141   private boolean verbose(IndexWriter writer) {
142     return writer != null && writer.infoStream.isEnabled("UPGMP");
143   }
144 
145   private void message(String message, IndexWriter writer) {
146     writer.infoStream.message("UPGMP", message);
147   }
148 }